package com.shengzai.rdd

import org.apache.spark.rdd.RDD
import org.apache.spark.{SparkConf, SparkContext}

/**
 * Demo of the RDD `sample` transformation: reads a text file of student
 * records and prints a random subset of its lines.
 */
object Demo6Sample {

  /**
   * Entry point. Builds a local SparkContext, loads the students file as an
   * RDD of lines, samples about 1% of them and prints each sampled line.
   *
   * @param args command-line arguments (not used)
   */
  def main(args: Array[String]): Unit = {
    val conf = new SparkConf()
    conf.setMaster("local")
    conf.setAppName("Filter")
    val sc = new SparkContext(conf)

    // Always stop the context, even if the job fails, so the local Spark
    // runtime and its resources are released.
    try {
      val stuRDD: RDD[String] = sc.textFile("hadoop_code/src/data/students.txt")

      // Sample ~1% of the lines without replacement. `fraction` is the
      // expected share of elements to keep, so the number of printed lines
      // is approximate rather than exactly 1% of the input.
      stuRDD
        .sample(withReplacement = false, fraction = 0.01)
        .foreach(println)
    } finally {
      sc.stop()
    }
  }
}
